#!/usr/bin/env bash
# Launch src/train_dynamic_language_model.py on GPU 5 with a fixed set of
# key=value configuration overrides.
#
# Usage: bash <this-script> [extra key=value overrides...]
#
# Any arguments given to this script are appended after the built-in
# overrides and forwarded unchanged to the training entry point.
#
# The overrides live in an array rather than in a backslash-continued command
# line: comments are legal between array elements, so an optional override can
# be enabled or disabled by (un)commenting exactly one line without breaking
# the command or accidentally turning the option into a separate command.

# Overrides passed to the training script, one per line.
overrides=(
  trainer.accelerator="gpu"
  data.batch_size=1
  logger=tensorboard
  trainer.val_check_interval=6400
  # NOTE(review): together with data.batch_size=1 this presumably yields an
  # effective batch of 32 samples per optimizer step — confirm against trainer.
  trainer.accumulate_grad_batches=32
  trainer.max_epochs=40
  model.optimizer.lr=0.0001
  paths.log_dir="/mnt/c8cdfbea-cfca-4bcf-97e2-1071164c0072/UserData/wangzeyuan/logs"

  # Optional overrides — uncomment a line to enable it.
  # callbacks.model_checkpoint.save_weights_only=True
  # model.ckpt_path="/home/zhangqiang/userdata/wangzeyuan/Dynamic/Dynamic.Training/logs/train_dynamic_language_model/runs/2025-05-08_16-30-13/checkpoints/epoch_002.ckpt"
)

# CUDA_VISIBLE_DEVICES is set only for this one command, restricting the
# process to GPU index 5.
CUDA_VISIBLE_DEVICES=5 python src/train_dynamic_language_model.py \
  "${overrides[@]}" "$@"